#pragma OPENCL EXTENSION cl_khr_fp16 : enable
#pragma OPENCL EXTENSION cl_khr_subgroups : enable

/*
 * Sub-group add-reduction, one input value per work-item.
 *
 * Each work-item reads the element of `in` at its dimension-0 global ID,
 * hands it to sub_group_reduce_add(), and writes the value that call
 * returns to `out` at the same index.
 *
 * out  destination buffer, written at index get_global_id(0)
 * in   source buffer, read at index get_global_id(0)
 *
 * There is no bounds check here, so both buffers presumably need at least
 * as many elements as the dimension-0 global size -- confirm against the
 * host-side launch code.
 */
__kernel void test_reduce_add(__global int* out, __global int* in) {
    /* Look the global ID up once; it indexes both the load and the store. */
    const size_t gid = get_global_id(0);
    const int lane_value = in[gid];

    /* Called unconditionally, outside any branch. */
    out[gid] = sub_group_reduce_add(lane_value);
}
